# Entry "hr_ml_agent_bench/baseline/gpt-4-1106-preview": the OpenAIChatSolver
# class from the hr_ml_agent_bench baseline module, set to model
# gpt-4-1106-preview.
hr_ml_agent_bench/baseline/gpt-4-1106-preview:
  # Written as "<dotted.module.path>:<ClassName>".
  class: evals.elsuite.hr_ml_agent_bench.solvers.baseline:OpenAIChatSolver
  args:
    # NOTE(review): this entry uses `completion_fn_kwargs`, whereas the
    # OpenAISolver entries in this file use `completion_fn_options`.
    # Presumably the two classes take different arguments; confirm
    # against OpenAIChatSolver before renaming either key.
    completion_fn_kwargs:
      # Only the model is set here; no temperature or max_tokens is given.
      model: gpt-4-1106-preview

# Entry "hr_ml_agent_bench/baseline/gpt-3.5-turbo-16k": the same
# OpenAIChatSolver class as the gpt-4-1106-preview baseline entry, set to
# model gpt-3.5-turbo-16k instead.
hr_ml_agent_bench/baseline/gpt-3.5-turbo-16k:
  # Written as "<dotted.module.path>:<ClassName>".
  class: evals.elsuite.hr_ml_agent_bench.solvers.baseline:OpenAIChatSolver
  args:
    # NOTE(review): key is `completion_fn_kwargs`, not the
    # `completion_fn_options` used by the OpenAISolver entries in this
    # file. Presumably intentional; confirm against OpenAIChatSolver.
    completion_fn_kwargs:
      # Only the model is set here; no temperature or max_tokens is given.
      model: gpt-3.5-turbo-16k

# Entry "hr_ml_agent_bench/direct/gpt-4-1106-preview": a single OpenAISolver
# set to model gpt-4-1106-preview with explicit sampling options and no
# nested solvers.
hr_ml_agent_bench/direct/gpt-4-1106-preview:
  # Written as "<dotted.module.path>:<ClassName>".
  class: evals.solvers.providers.openai.openai_solver:OpenAISolver
  args:
    completion_fn_options:
      model: gpt-4-1106-preview
      # NOTE(review): presumably passed through to the completion request
      # as extra parameters; confirm against OpenAISolver.
      extra_options:
        temperature: 1
        max_tokens: 4096

# Entry "hr_ml_agent_bench/cot/gpt-4-1106-preview": a CoTSolver wrapping two
# nested OpenAISolver configurations, `cot_solver` and `extract_solver`.
# Both use model gpt-4-1106-preview at temperature 1; they differ only in
# max_tokens (4096 vs 512).
hr_ml_agent_bench/cot/gpt-4-1106-preview:
  # Written as "<dotted.module.path>:<ClassName>".
  class: evals.solvers.nested.cot_solver:CoTSolver
  args:
    # NOTE(review): presumably the solver that produces the reasoning
    # text; verify against CoTSolver.
    cot_solver:
      class: evals.solvers.providers.openai.openai_solver:OpenAISolver
      args:
        completion_fn_options:
          model: gpt-4-1106-preview
          extra_options:
            temperature: 1
            max_tokens: 4096
    # NOTE(review): presumably the solver that extracts the final answer
    # from the reasoning, which would explain the smaller max_tokens;
    # verify against CoTSolver.
    extract_solver:
      class: evals.solvers.providers.openai.openai_solver:OpenAISolver
      args:
        completion_fn_options:
          model: gpt-4-1106-preview
          extra_options:
            temperature: 1
            max_tokens: 512
